ABCDEFGHIJKLMNOPQRSTUVWXYZAAABACADAEAFAGAHAIAJAKALAMANAOAPAQARASATAUAVAWAXAYAZBA
1
32FeatureMAP
32 x 32
2
ping pong bram! bram = simple bramwrite a = ! write bDelay Line
3
idx012...n
4
case1case2ping
pong
bram
➡️datadatadata...data➡️pe➡️
5
write a = trueb = false)write a = trueb = false)➡️➡️➡️...➡️
6
7
bram0bram1bram0bram1
8
addrdataaddr512addrdataaddr512
9
0x005120x005120x005120x00512PE (Mac Unit)
10
write➡️0x015120x015120x015120x01512
32x32
32
11
0x025120x025120x02512write➡️0x02512int8 featureMAPint8
12
0x035120x035120x035120x03512xX⬇️
13
0x04512read➡️0x045120x04512read➡️0x04512int8 Weightint8➡️int16➡️int8
14
read➡️0x055120x05512write➡️0x055120x05512⬇️↘️result
int32
15
0x065120x065120x065120x06512= INT16int8int16+d
e
l
a
y

L
i
n
e
16
0x075120x075120x075120x07512⬇️
17
0x085120x085120x085120x08512+ result int32result
int32
18
0x095120x095120x095120x09512= result int32
19
20
21
Delay Line
22
rms norm inv sqrt
23
16bit8bit32
Weight
32x1
➡️0PEPEPEPEPEPEPE
24
rmsnorm_slope.memrmsnorm_inter.mem
25
ADDRValueAddrValue➡️PEPEPEPEPEPEPEPE
26
0x00000000477A0x100000FF
27
0x0001000047580x100104FA➡️PEPEPEPEPEPEPEPE
28
0x00020000474D0x100200FF
29
0x0003000047420x100304FA➡️PEPEPEPEPEPEPEPE
30
0x0004000047370x100400FF
31
0x00050000472C0x100504FA······
32
0x0006000047210x100610FF
33
0x0007000047160x100704FA➡️PEPEPEPEPEPEPEPE
34
0x00080000470B0x100800FF
35
0x0009000047370x100904FA➡️PEPEPEPEPEPEPEPE
36
0x00100000472C0x101000FF
37
0x0011000047210x101104FA➡️PEPEPEPEPEPEPEPE
38
0x0012000047160x101200FF
39
➡️PEPEPEPEPEPEPE1024
40
41
42
43
gelu LUT
44
result ping pong bram0O_accO_accO_accO_accO_accO_accO_acc
45
gelu table
46
addrvalueo_acc
[0,0]
32bit
o_acc
[0,1]
32bit
...o_acc
[31,31]
32bit
O_accO_accO_accO_accO_accO_accO_accO_acc
47
10x00
48
gelu_table[x]20x01O_accO_accO_accO_accO_accO_accO_accO_acc
49
=30x01⬇️ flatten
50
outputint3240x02ram⬅️O_accO_accO_accO_accO_accO_accO_accO_acc
51
3276850x02o_acc [0,0]o_acc [0,1]...
52
60x0332bit length32bit length...······
53
......
54
327680xFF⬇️ cpu(ram)으로 보내기O_accO_accO_accO_accO_accO_accO_accO_acc
55
56
O_accO_accO_accO_accO_accO_accO_accO_acc
57
58
softmaxexpunitO_accO_accO_accO_accO_accO_accO_accO_acc
59
60
O_accO_accO_accO_accO_accO_accO_acc1024